# Sub-sample the development and test arrays and pair-plot their first
# three columns, coloured by data source.
#
# Relies on names defined earlier: T_dev, T_test, U_test (2-D/1-D arrays
# indexed by row) and T_var (column names).
# NOTE(review): U_test presumably holds one unit identifier per row of
# T_test -- confirm against the loading code.

# Development set: draw up to 10000 distinct row indices.
dim, size = T_dev.shape[0], 10000
# replace=False raises ValueError when size > dim, so clamp to the row count.
size = min(size, dim)
mask_dev = np.random.choice(dim, size, replace=False)
df_T_dev = pd.DataFrame(T_dev[mask_dev, 0:3], columns=T_var[0:3])
df_T_dev['source'] = 'dev'

# Test set: same sampling, with the indices sorted so the sampled rows
# keep their original order.
dim, size = T_test.shape[0], 10000
size = min(size, dim)
mask_test = np.sort(np.random.choice(dim, size, replace=False))
df_T_test = pd.DataFrame(T_test[mask_test, 0:3], columns=T_var[0:3])

# Label every sampled test row as 'Unit <id>'. Building the string column
# in one assignment avoids writing strings into a column that was first
# filled with the raw U_test values (an incompatible-dtype setitem, which
# recent pandas versions deprecate).
# NOTE(review): a NaN id is now labelled 'Unit nan'; the previous
# per-unit loop left such rows unlabelled.
sampled_units = np.ravel(U_test[mask_test])
df_T_test['source'] = ['Unit ' + str(unit_id) for unit_id in sampled_units]

df_T = pd.concat([df_T_dev, df_T_test], ignore_index=True)

# Plot
sns.set(font_scale=1.4)
sns.pairplot(df_T, hue='source', height=4)